###Raw Whisper Transform
# ckp="/apdcephfs_qy3/share_976139/users/joyounglv/pretrained_ckpt/whisper-large-v3"
# TP=4
# out_path=whisper-large-v3-megatron-TP$TP-TE-v1
# python examples/audiollm/whisper_converter_v1.py --load $ckp --save $out_path --tensor-parallel-size $TP


### Qwen2Audio Transform
# Invokes examples/audiollm/whisper_converter_v1.py on the Qwen2-Audio-7B-Instruct
# checkpoint with --load-prefix "audio_tower." and --save-prefix "speech_model".
# NOTE(review): presumably this selects the audio-encoder weights and renames
# them for a Megatron checkpoint -- confirm against the converter script.
#
# Both the converter script path and out_path are relative, so they are
# resolved against the directory this script is run from.
ckp="/apdcephfs_qy3/share_976139/users/adrenzhou/nlp_workdir/pretrained_models/Qwen/Qwen2-Audio-7B-Instruct"
TP=1
out_path="qwen2-audio-encoder-proj-7b-instruct-megatron-TP${TP}-TE-v1"

# Every expansion is quoted so a path containing whitespace or glob characters
# is still passed to the converter as a single argument.
python examples/audiollm/whisper_converter_v1.py \
  --load "${ckp}" \
  --save "${out_path}" \
  --tensor-parallel-size "${TP}" \
  --load-prefix "audio_tower." \
  --save-prefix "speech_model"